
% Chow and Liu (1968): journal article on approximating discrete
% probability distributions with dependence trees.
@article{chow:68,
  author  = {Chow, C. K. and Liu, C. N.},
  title   = {Approximating discrete probability distributions with dependence trees},
  journal = {IEEE Transactions on Information Theory},
  volume  = {IT-14},
  number  = {3},
  pages   = {462--467},
  year    = {1968},
}
  
  % Kaelbling, Littman and Moore (1996): survey article on reinforcement learning.
  @article{rlsurvey,
    author  = {Kaelbling, Leslie Pack and Littman, Michael L. and Moore, Andrew W.},
    title   = {Reinforcement learning: a survey},
    journal = {Journal of Artificial Intelligence Research},
    volume  = {4},
    pages   = {237--285},
    year    = {1996},
  }

% Bertsekas and Tsitsiklis (1996): the Neuro-Dynamic Programming book.
% The series name and number live in series/volume rather than in the title,
% and month uses the predefined three-letter macro so styles can localise it.
% The citeulike-*, posted-at, priority, keywords and howpublished fields are
% not used by standard styles for a book entry; they are kept as annotations.
@book{ndp,
	author = {Bertsekas, Dimitri P. and Tsitsiklis, John N.},
	title = {Neuro-Dynamic Programming},
	series = {Optimization and Neural Computation Series},
	volume = {3},
	publisher = {{Athena Scientific}},
	month = may,
	year = {1996},
	isbn = {1886529108},
	howpublished = {Hardcover},
	keywords = {optimization, programming, reinforcement},
	citeulike-article-id = {206209},
	posted-at = {2007-07-27 20:43:16},
	priority = {3}
}

% Sutton and Barto (1998): the reinforcement learning textbook.
% The second author's surname is "Barto" (previously misspelled "Bartol").
% Braces in the title protect capitals from sentence-casing styles.
@book{rlbook,
  author    = {Richard S. Sutton and Andrew G. Barto},
  title     = {Reinforcement {L}earning: {A}n {I}ntroduction},
  publisher = {The MIT Press},
  address   = {Cambridge, Massachusetts},
  year      = {1998}
}

% Mitchell (1997): the Machine Learning textbook.
@book{mitchell:97,
  author    = {Mitchell, Tom M.},
  title     = {Machine {L}earning},
  publisher = {McGraw Hill},
  address   = {New York, New York},
  year      = {1997},
}

% Smart and Kaelbling (2000): conference paper on reinforcement learning in
% continuous spaces.
% The publisher's city is held in address, not appended to the publisher
% name, so styles can format the two independently.
@inproceedings{smart:00,
    author    = {William D. Smart and Leslie Pack Kaelbling},
    title     = {Practical Reinforcement Learning in Continuous Spaces},
    booktitle = {Proc. 17th International Conf. on Machine Learning},
    publisher = {Morgan Kaufmann},
    address   = {San Francisco, CA},
    pages     = {903--910},
    year      = {2000}
}
    
% Boyan and Moore (1995): paper in Advances in Neural Information Processing
% Systems 7 on safely approximating the value function.
@inproceedings{boyan:95,
  author    = {Boyan, Justin A. and Moore, Andrew W.},
  title     = {Generalization in Reinforcement Learning: {S}afely Approximating the Value Function},
  booktitle = {Advances in Neural Information Processing Systems 7},
  editor    = {Tesauro, G. and Touretzky, D. S. and Leen, T. K.},
  publisher = {The MIT Press},
  address   = {Cambridge, MA},
  pages     = {369--376},
  year      = {1995},
}
    
  % Wiewiora, Cottrell and Elkan (2003): conference paper on advising
  % reinforcement learning agents.
  % The title carries no trailing period; terminal punctuation is supplied
  % by the bibliography style.
  @inproceedings{wiewiora:03,
    author    = {Eric Wiewiora and Garrison W. Cottrell and Charles Elkan},
    title     = {Principled Methods for Advising Reinforcement Learning Agents},
    booktitle = {International Conference on Machine Learning},
    pages     = {792--799},
    year      = {2003}
  }
  
  % Moore (1990): PhD thesis on memory-based learning for robot control.
  @phdthesis{moore:90,
    author  = {Moore, A. W.},
    title   = {Efficient Memory-based Learning for Robot Control},
    school  = {University of Cambridge},
    address = {Cambridge, UK},
    year    = {1990},
  }
    
      % White (2006): master's thesis on benchmarking in reinforcement learning.
      % The entry type directly follows the at-sign with no intervening space,
      % which every BibTeX-compatible parser accepts.
      @mastersthesis{whitethesis,
        author  = {Adam White},
        title   = {A {S}tandard {S}ystem for {B}enchmarking in {R}einforcement {L}earning},
        school  = {University of Alberta},
        address = {Alberta, Canada},
        year    = {2006}
      }
    
    
 % Singh and Sutton (1996): journal article on replacing eligibility traces.
 @article{singh:96,
   author  = {Singh, Satinder P. and Sutton, Richard S.},
   title   = {Reinforcement Learning with Replacing Eligibility Traces},
   journal = {Machine Learning},
   year    = {1996},
   volume  = {22},
   number  = {1--3},
   pages   = {123--158},
 }
    
     % White and Sutton (2009): article on the RL-Glue protocol.
     % volume, number and pages previously held literal "??" placeholders,
     % which would be printed verbatim in the bibliography. They are omitted
     % until the real values are known; the ignored internal-note field
     % records what is still missing.
     @article{whitesutton,
       author        = {Adam White and Richard S. Sutton},
       title         = {The {RL}-{G}lue {P}rotocol: a {C}ommunication {S}tandard for {R}einforcement {L}earning {E}xperiments},
       journal       = {Journal of Machine Learning Research},
       year          = {2009},
       internal-note = {TODO: volume, number and pages unknown when this entry was written; confirm publication details}
     }
    
% Riedmiller (2005): conference paper introducing Neural Fitted Q Iteration.
% The page range uses the double hyphen (en dash) that BibTeX expects, the
% title has no hard-coded trailing period, and {Q} is braced so that
% sentence-casing styles do not lowercase it.
@inproceedings{riedmiller:05,
  author    = {Martin Riedmiller},
  title     = {Neural Fitted {Q} Iteration - First Experiences with a Data Efficient Neural Reinforcement Learning Method},
  booktitle = {European Conference on Machine Learning},
  pages     = {317--328},
  year      = {2005}
}
  
% Bagnell (2004): PhD thesis on robustness, uncertainty and approximation
% in learning decisions.
% month uses the predefined three-letter macro (unbraced) so that the
% bibliography style controls abbreviation and language.
@phdthesis{bagnell:04,
   author  = {James Bagnell},
   title   = {Learning Decisions: Robustness, Uncertainty, and Approximation},
   school  = {Robotics Institute, Carnegie Mellon University},
   address = {Pittsburgh, PA},
   month   = aug,
   year    = {2004}
}
  
  % Sutton (1996): paper in Advances in Neural Information Processing Systems,
  % volume 8, on sparse coarse coding.
  @inproceedings{sutton:96,
    author    = {Sutton, Richard S.},
    title     = {Generalization in Reinforcement Learning: Successful Examples Using Sparse Coarse Coding},
    booktitle = {Advances in Neural Information Processing Systems},
    volume    = {8},
    editor    = {Touretzky, David S. and Mozer, Michael C. and Hasselmo, Michael E.},
    publisher = {The {MIT} Press},
    pages     = {1038--1044},
    year      = {1996},
  }
    
% Newman, Hettich, Blake and Merz (1998): the UCI machine learning repository.
% Author names are separated by the keyword "and"; a comma-separated list is
% read by BibTeX as a single malformed name. Initials are spaced.
% The url holds the raw address with a literal tilde rather than LaTeX math
% markup. Standard styles ignore institution for a misc entry; it is kept as
% an annotation.
@misc{uci:98,
  author      = {Newman, D. J. and Hettich, S. and Blake, C. L. and Merz, C. J.},
  title       = {{UCI} Repository of machine learning databases},
  year        = {1998},
  url         = {http://www.ics.uci.edu/~mlearn/MLRepository.html},
  institution = {University of California, Irvine, Dept. of Information and Computer Sciences}
}

% Powers, Sandifer, Rice, Glick and Cramblitt (1995): reference to the
% Standard Performance Evaluation Corporation web site.
@misc{spec:95,
  author = {Powers, Kathy and Sandifer, Cathy and Rice, Dianne and Glick, Jason and Cramblitt, Bob},
  title  = {Standard Performance Evaluation Corporation},
  url    = {http://www.spec.org/},
  year   = {1995},
}


% Boisvert, Pozo, Remington, Barrett and Dongarra (1997): paper describing
% the Matrix Market collection of test matrices.
@inproceedings{matrix:97,
  author    = {Boisvert, Ronald F. and Pozo, Roldan and Remington, Karin and Barrett, Richard and Dongarra, Jack J.},
  title     = {The {Matrix Market}: {A} Web Resource for Test Matrix Collections},
  booktitle = {Quality of Numerical Software, Assessment and Enhancement},
  editor    = {Boisvert, Ronald F.},
  publisher = {Chapman \& Hall},
  address   = {London},
  pages     = {125--137},
  year      = {1997},
}
    

% Sturtevant (2003): PhD thesis on algorithms for multi-player games.
@phdthesis{sturtevant:03,
  author = {Sturtevant, Nathan R.},
  title  = {Multi-Player Games: Algorithms and Approaches},
  school = {Computer Science Department, UCLA},
  year   = {2003},
}